%matplotlib inline
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

plt.style.use('ggplot')
plt.rcParams['figure.figsize'] = (15, 3)
plt.rcParams['font.family'] = 'sans-serif'


weather_2012_final = pd.read_csv('../data/weather_2012.csv', index_col='Date/Time')
weather_2012_final['Temp (C)'].plot(figsize=(15, 6))

<matplotlib.axes._subplots.AxesSubplot at 0x114b819a0>


url_template = "http://climate.weather.gc.ca/climateData/bulkdata_e.html?format=csv&stationID=5415&Year={year}&Month={month}&timeframe=1&submit=Download+Data"


#url = url_template.format(month=3, year=2012)
#weather_mar2012 = pd.read_csv(url, skiprows=15, index_col='Date/Time', parse_dates=True, encoding='latin1', header=True)

# because the url is broken, we use our saved dataframe for now
weather_mar2012 = pd.read_csv('../data/weather_2012.csv')


weather_mar2012


weather_mar2012[u"Temp (C)"].plot(figsize=(15, 5))

<matplotlib.axes._subplots.AxesSubplot at 0x1150d5250>


weather_mar2012.columns = [
    u'Year', u'Month', u'Day', u'Time', u'Data Quality', u'Temp (C)', 
    u'Temp Flag', u'Dew Point Temp (C)', u'Dew Point Temp Flag', 
    u'Rel Hum (%)', u'Rel Hum Flag', u'Wind Dir (10s deg)', u'Wind Dir Flag', 
    u'Wind Spd (km/h)', u'Wind Spd Flag', u'Visibility (km)', u'Visibility Flag',
    u'Stn Press (kPa)', u'Stn Press Flag', u'Hmdx', u'Hmdx Flag', u'Wind Chill', 
    u'Wind Chill Flag', u'Weather']

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-24-e81e0193d388> in <module>
----> 1 weather_mar2012.columns = [
      2     u'Year', u'Month', u'Day', u'Time', u'Data Quality', u'Temp (C)',
      3     u'Temp Flag', u'Dew Point Temp (C)', u'Dew Point Temp Flag',
      4     u'Rel Hum (%)', u'Rel Hum Flag', u'Wind Dir (10s deg)', u'Wind Dir Flag',
      5     u'Wind Spd (km/h)', u'Wind Spd Flag', u'Visibility (km)', u'Visibility Flag',

~/.virtualenvs/cookbook/lib/python3.8/site-packages/pandas/core/generic.py in __setattr__(self, name, value)
   5141         try:
   5142             object.__getattribute__(self, name)
-> 5143             return object.__setattr__(self, name, value)
   5144         except AttributeError:
   5145             pass

pandas/_libs/properties.pyx in pandas._libs.properties.AxisProperty.__set__()

~/.virtualenvs/cookbook/lib/python3.8/site-packages/pandas/core/generic.py in _set_axis(self, axis, labels)
    562     def _set_axis(self, axis: int, labels: Index) -> None:
    563         labels = ensure_index(labels)
--> 564         self._mgr.set_axis(axis, labels)
    565         self._clear_item_cache()
    566 

~/.virtualenvs/cookbook/lib/python3.8/site-packages/pandas/core/internals/managers.py in set_axis(self, axis, new_labels)
    214 
    215         if new_len != old_len:
--> 216             raise ValueError(
    217                 f"Length mismatch: Expected axis has {old_len} elements, new "
    218                 f"values have {new_len} elements"

ValueError: Length mismatch: Expected axis has 8 elements, new values have 24 elements


weather_mar2012 = weather_mar2012.dropna(axis=1, how='any')
weather_mar2012[:5]


weather_mar2012 = weather_mar2012.drop(['Year', 'Month', 'Day', 'Time', 'Data Quality'], axis=1)
weather_mar2012[:5]


temperatures = weather_mar2012[[u'Temp (C)']].copy()
print(temperatures.head)
temperatures.loc[:,'Hour'] = weather_mar2012.index.hour
temperatures.groupby('Hour').aggregate(np.median).plot()

<bound method DataFrame.head of                      Temp (C)
Date/Time                    
2012-03-01 00:00:00      -5.5
2012-03-01 01:00:00      -5.7
2012-03-01 02:00:00      -5.4
2012-03-01 03:00:00      -4.7
2012-03-01 04:00:00      -5.4
2012-03-01 05:00:00      -5.3
2012-03-01 06:00:00      -5.2
2012-03-01 07:00:00      -4.9
2012-03-01 08:00:00      -5.0
2012-03-01 09:00:00      -4.9
2012-03-01 10:00:00      -4.7
2012-03-01 11:00:00      -4.4
2012-03-01 12:00:00      -4.3
2012-03-01 13:00:00      -4.3
2012-03-01 14:00:00      -3.9
2012-03-01 15:00:00      -3.3
2012-03-01 16:00:00      -2.7
2012-03-01 17:00:00      -2.9
2012-03-01 18:00:00      -3.0
2012-03-01 19:00:00      -3.6
2012-03-01 20:00:00      -3.7
2012-03-01 21:00:00      -3.9
2012-03-01 22:00:00      -4.3
2012-03-01 23:00:00      -4.3
2012-03-02 00:00:00      -4.8
2012-03-02 01:00:00      -5.3
2012-03-02 02:00:00      -5.2
2012-03-02 03:00:00      -5.5
2012-03-02 04:00:00      -5.6
2012-03-02 05:00:00      -5.5
...                       ...
2012-03-30 18:00:00       3.9
2012-03-30 19:00:00       3.1
2012-03-30 20:00:00       3.0
2012-03-30 21:00:00       1.7
2012-03-30 22:00:00       0.4
2012-03-30 23:00:00       1.4
2012-03-31 00:00:00       1.5
2012-03-31 01:00:00       1.3
2012-03-31 02:00:00       1.3
2012-03-31 03:00:00       0.7
2012-03-31 04:00:00      -0.9
2012-03-31 05:00:00      -0.6
2012-03-31 06:00:00      -0.5
2012-03-31 07:00:00      -0.3
2012-03-31 08:00:00       0.7
2012-03-31 09:00:00       1.5
2012-03-31 10:00:00       2.9
2012-03-31 11:00:00       4.6
2012-03-31 12:00:00       6.4
2012-03-31 13:00:00       6.5
2012-03-31 14:00:00       7.7
2012-03-31 15:00:00       7.7
2012-03-31 16:00:00       8.4
2012-03-31 17:00:00       7.9
2012-03-31 18:00:00       7.0
2012-03-31 19:00:00       5.9
2012-03-31 20:00:00       4.4
2012-03-31 21:00:00       2.6
2012-03-31 22:00:00       2.7
2012-03-31 23:00:00       1.5

[744 rows x 1 columns]>

<matplotlib.axes._subplots.AxesSubplot at 0x7fbac6876b10>


def download_weather_month(year, month):
    if month == 1:
        year += 1
    url = url_template.format(year=year, month=month)
    weather_data = pd.read_csv(url, skiprows=15, index_col='Date/Time', parse_dates=True, header=True)
    weather_data = weather_data.dropna(axis=1)
    weather_data.columns = [col.replace('\xb0', '') for col in weather_data.columns]
    weather_data = weather_data.drop(['Year', 'Day', 'Month', 'Time', 'Data Quality'], axis=1)
    return weather_data


download_weather_month(2012, 1)[:5]


data_by_month = [download_weather_month(2012, i) for i in range(1, 13)]


weather_2012 = pd.concat(data_by_month)
weather_2012


weather_2012.to_csv('../data/weather_2012.csv')

	Date/Time	Temp (C)	Dew Point Temp (C)	Rel Hum (%)	Wind Spd (km/h)	Visibility (km)	Stn Press (kPa)	Weather
0	2012-01-01 00:00:00	-1.8	-3.9	86	4	8.0	101.24	Fog
1	2012-01-01 01:00:00	-1.8	-3.7	87	4	8.0	101.24	Fog
2	2012-01-01 02:00:00	-1.8	-3.4	89	7	4.0	101.26	Freezing Drizzle,Fog
3	2012-01-01 03:00:00	-1.5	-3.2	88	6	4.0	101.27	Freezing Drizzle,Fog
4	2012-01-01 04:00:00	-1.5	-3.3	88	7	4.8	101.23	Fog
...	...	...	...	...	...	...	...	...
8779	2012-12-31 19:00:00	0.1	-2.7	81	30	9.7	100.13	Snow
8780	2012-12-31 20:00:00	0.2	-2.4	83	24	9.7	100.03	Snow
8781	2012-12-31 21:00:00	-0.5	-1.5	93	28	4.8	99.95	Snow
8782	2012-12-31 22:00:00	-0.2	-1.8	89	28	9.7	99.91	Snow
8783	2012-12-31 23:00:00	0.0	-2.1	86	30	11.3	99.89	Snow

	Temp (C)	Dew Point Temp (C)	Rel Hum (%)	Wind Spd (km/h)	Visibility (km)	Stn Press (kPa)	Weather
Date/Time
2012-03-01 00:00:00	-5.5	-9.7	72	24	4.0	100.97	Snow
2012-03-01 01:00:00	-5.7	-8.7	79	26	2.4	100.87	Snow
2012-03-01 02:00:00	-5.4	-8.3	80	28	4.8	100.80	Snow
2012-03-01 03:00:00	-4.7	-7.7	79	28	4.0	100.69	Snow
2012-03-01 04:00:00	-5.4	-7.8	83	35	1.6	100.62	Snow

	Temp (C)	Dew Point Temp (C)	Rel Hum (%)	Wind Spd (km/h)	Visibility (km)	Stn Press (kPa)	Weather
Date/Time
2013-01-01 00:00:00	-1.0	-1.7	95	35	6.4	99.89	Snow
2013-01-01 01:00:00	-2.0	-5.1	79	35	16.1	99.93	Mainly Clear
2013-01-01 02:00:00	-2.7	-6.0	78	28	19.3	100.08	Snow
2013-01-01 03:00:00	-5.6	-11.7	62	30	25.0	100.21	Clear
2013-01-01 04:00:00	-7.7	-12.6	68	35	19.3	100.32	Mainly Clear

	Temp (C)	Dew Point Temp (C)	Rel Hum (%)	Wind Spd (km/h)	Visibility (km)	Stn Press (kPa)	Weather
Date/Time
2013-01-01 00:00:00	-1.0	-1.7	95	35	6.4	99.89	Snow
2013-01-01 01:00:00	-2.0	-5.1	79	35	16.1	99.93	Mainly Clear
2013-01-01 02:00:00	-2.7	-6.0	78	28	19.3	100.08	Snow
2013-01-01 03:00:00	-5.6	-11.7	62	30	25.0	100.21	Clear
2013-01-01 04:00:00	-7.7	-12.6	68	35	19.3	100.32	Mainly Clear
2013-01-01 05:00:00	-9.7	-14.8	66	33	25.0	100.47	Clear
2013-01-01 06:00:00	-11.1	-17.0	62	30	25.0	100.65	Clear
2013-01-01 07:00:00	-12.2	-17.2	66	20	25.0	100.78	Clear
2013-01-01 08:00:00	-13.0	-17.7	68	13	24.1	100.87	Clear
2013-01-01 09:00:00	-13.0	-17.3	70	20	24.1	100.86	Clear
2013-01-01 10:00:00	-12.6	-17.8	65	19	24.1	100.90	Clear
2013-01-01 11:00:00	-12.2	-17.6	64	22	24.1	100.88	Mainly Clear
2013-01-01 12:00:00	-11.8	-17.2	64	26	24.1	100.87	Mainly Clear
2013-01-01 13:00:00	-11.3	-17.4	61	26	24.1	100.83	Mainly Clear
2013-01-01 14:00:00	-11.3	-17.4	61	28	24.1	100.82	Mainly Clear
2013-01-01 15:00:00	-11.4	-17.6	60	30	24.1	100.85	Mainly Clear
2013-01-01 16:00:00	-12.0	-18.0	61	22	24.1	100.81	Mainly Clear
2013-01-01 17:00:00	-13.0	-18.4	64	19	25.0	100.90	Clear
2013-01-01 18:00:00	-13.4	-18.4	66	24	25.0	100.96	Clear
2013-01-01 19:00:00	-14.1	-18.7	68	20	25.0	101.02	Clear
2013-01-01 20:00:00	-14.3	-19.0	67	15	25.0	101.04	Clear
2013-01-01 21:00:00	-14.8	-19.5	67	15	25.0	100.98	Mainly Clear
2013-01-01 22:00:00	-16.3	-20.2	72	7	25.0	100.98	Mostly Cloudy
2013-01-01 23:00:00	-15.4	-19.8	69	11	25.0	100.99	Cloudy
2013-01-02 00:00:00	-14.0	-18.4	69	11	19.3	100.96	Snow
2013-01-02 01:00:00	-14.1	-18.3	70	11	25.0	100.91	Mostly Cloudy
2013-01-02 02:00:00	-14.3	-18.3	72	13	25.0	100.94	Snow Showers
2013-01-02 03:00:00	-14.7	-18.0	76	9	19.3	100.91	Snow
2013-01-02 04:00:00	-14.2	-17.1	79	6	9.7	100.83	Snow
2013-01-02 05:00:00	-14.3	-17.0	80	0	6.4	100.81	Snow
...	...	...	...	...	...	...	...
2012-12-30 18:00:00	-12.6	-16.0	76	24	25.0	101.36	Mainly Clear
2012-12-30 19:00:00	-13.4	-16.5	77	26	25.0	101.47	Mainly Clear
2012-12-30 20:00:00	-13.8	-16.5	80	24	25.0	101.52	Clear
2012-12-30 21:00:00	-13.8	-16.5	80	20	25.0	101.50	Mainly Clear
2012-12-30 22:00:00	-13.7	-16.3	81	19	25.0	101.54	Mainly Clear
2012-12-30 23:00:00	-12.1	-15.1	78	28	25.0	101.52	Mostly Cloudy
2012-12-31 00:00:00	-11.1	-14.4	77	26	25.0	101.51	Cloudy
2012-12-31 01:00:00	-10.7	-14.0	77	15	25.0	101.50	Cloudy
2012-12-31 02:00:00	-10.1	-13.4	77	9	25.0	101.45	Cloudy
2012-12-31 03:00:00	-11.8	-14.4	81	6	25.0	101.42	Mostly Cloudy
2012-12-31 04:00:00	-10.5	-12.8	83	11	25.0	101.34	Cloudy
2012-12-31 05:00:00	-10.2	-12.4	84	6	25.0	101.28	Cloudy
2012-12-31 06:00:00	-9.7	-11.7	85	4	25.0	101.23	Cloudy
2012-12-31 07:00:00	-9.3	-11.3	85	0	19.3	101.19	Snow Showers
2012-12-31 08:00:00	-8.6	-10.3	87	4	3.2	101.14	Snow Showers
2012-12-31 09:00:00	-8.1	-9.6	89	4	2.4	101.09	Snow
2012-12-31 10:00:00	-7.4	-8.9	89	4	6.4	101.05	Snow,Fog
2012-12-31 11:00:00	-6.7	-7.9	91	9	9.7	100.93	Snow
2012-12-31 12:00:00	-5.8	-7.5	88	4	12.9	100.78	Snow
2012-12-31 13:00:00	-4.6	-6.6	86	4	12.9	100.63	Snow
2012-12-31 14:00:00	-3.4	-5.7	84	6	11.3	100.57	Snow
2012-12-31 15:00:00	-2.3	-4.6	84	9	9.7	100.47	Snow
2012-12-31 16:00:00	-1.4	-4.0	82	13	12.9	100.40	Snow
2012-12-31 17:00:00	-1.1	-3.3	85	19	9.7	100.30	Snow
2012-12-31 18:00:00	-1.3	-3.1	88	17	9.7	100.19	Snow
2012-12-31 19:00:00	0.1	-2.7	81	30	9.7	100.13	Snow
2012-12-31 20:00:00	0.2	-2.4	83	24	9.7	100.03	Snow
2012-12-31 21:00:00	-0.5	-1.5	93	28	4.8	99.95	Snow
2012-12-31 22:00:00	-0.2	-1.8	89	28	9.7	99.91	Snow
2012-12-31 23:00:00	0.0	-2.1	86	30	11.3	99.89	Snow

Summary¶

5.1 Downloading one month of weather data¶

5.2 Plotting the temperature by hour of day¶

5.3 Getting the whole year of data¶

5.4 Saving to a CSV¶

	Year	Month	Day	Time	Temp (C)	Dew Point Temp (C)	Rel Hum (%)	Wind Spd (km/h)	Visibility (km)	Stn Press (kPa)	Weather
Date/Time
2012-03-01 00:00:00	2012	3	1	00:00	-5.5	-9.7	72	24	4.0	100.97	Snow
2012-03-01 01:00:00	2012	3	1	01:00	-5.7	-8.7	79	26	2.4	100.87	Snow
2012-03-01 02:00:00	2012	3	1	02:00	-5.4	-8.3	80	28	4.8	100.80	Snow
2012-03-01 03:00:00	2012	3	1	03:00	-4.7	-7.7	79	28	4.0	100.69	Snow
2012-03-01 04:00:00	2012	3	1	04:00	-5.4	-7.8	83	35	1.6	100.62	Snow